Expert(Sto) Return Avg: 12427.49, std: 486.38
array([12258.711, 12900.472, 10293.933, 12324.679, 12312.501, 12536.946,
       12579.71 , 12439.509, 12037.562, 13143.215, 12696.208, 12410.66 ,
       12714.029, 12244.488, 12662.132, 12945.88 , 12545.556, 11920.783,
       12760.411, 12655.707, 12542.178, 12514.93 , 12357.07 , 12783.59 ,
       12130.195, 12822.858, 11546.802, 12826.838, 12990.03 , 11033.234,
       13208.215, 12378.109, 12457.043, 12198.133, 12560.387, 12830.687,
       12058.786, 12250.469, 11458.793, 12540.908, 12651.069, 12433.801,
       12668.406, 12161.804, 12577.811, 12098.953, 11933.758, 12452.899,
       12710.076, 12281.293, 12285.43 , 11511.206, 12455.976, 12447.731,
       12200.233, 12241.609, 12865.379, 13039.216, 12443.003, 13084.916,
       12650.83 , 12622.516, 12621.77 , 13047.351])
Expert(Det) Return Avg: 12231.50, std: 1714.54
array([13392.609, 12932.355, 13057.73 , 12908.568, 12028.123, 12888.124,
       13178.398, 12981.372, 12047.816, 13445.864, 12479.404, 12765.99 ,
       12464.873, 12474.011, 12866.371, 12655.08 , 12935.38 , 13201.221,
       13032.162,  9088.303, 12248.007,  5022.807, 12238.342, 13424.47 ,
       13060.438, 12163.171, 12080.135, 12592.178, 12986.858, 12714.581,
       12510.57 , 12564.037, 12904.775, 13047.999, 12735.466, 12225.967,
       12551.133, 12781.338, 13199.784, 12939.976,  5415.128,  9587.389,
       13333.072, 13012.154, 13123.146, 12402.16 , 12635.329,  7062.029,
       12711.009, 13322.964, 12802.869, 12195.328, 12684.502, 12372.396,
       13048.759,  9752.059, 12786.442, 12688.294,  8497.213, 13134.197,
       12715.255, 11895.964, 13198.252, 13624.276])
ordereddict([('seed', 1), ('cuda', -1), ('env', ordereddict([('env_name', 'HalfCheetahFH-v0'), ('T', 1000)])), ('sac', ordereddict([('epochs', 3000), ('log_step_interval', 5000), ('update_every', 50), ('update_num', 1), ('random_explore_episodes', 10), ('batch_size', 100), ('lr', 0.001), ('alpha', 0.2), ('automatic_alpha_tuning', False), ('buffer_size', 1000000), ('num_test_episodes', 10)])), ('expert', ordereddict([('samples_episode', 64)]))])